summaryrefslogtreecommitdiffstats
path: root/src/common/x64/cpu_wait.cpp
blob: cfeef6a3d3b4d27bf9c5ddd68f53795644d338df (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
// SPDX-FileCopyrightText: Copyright 2023 yuzu Emulator Project
// SPDX-License-Identifier: GPL-2.0-or-later

#include <thread>

#ifdef _MSC_VER
#include <intrin.h>
#endif

#include "common/x64/cpu_detect.h"
#include "common/x64/cpu_wait.h"

namespace Common::X64 {

#ifdef _MSC_VER
// Reads the time-stamp counter through the __rdtsc() intrinsic and returns its value.
//
// The read is bracketed on both sides by an _mm_lfence() / _ReadWriteBarrier() pair.
// NOTE(review): the intent appears to be to stop the counter read from being reordered
// with surrounding code by the CPU (lfence) or by the compiler (_ReadWriteBarrier) -
// confirm against the Intel RDTSC/LFENCE guidance and the MSVC intrinsic documentation.
__forceinline static u64 FencedRDTSC() {
    // Fence ahead of the counter read.
    _mm_lfence();
    _ReadWriteBarrier();
    const u64 result = __rdtsc();
    // Fence again after the read, before the value is handed back to the caller.
    _mm_lfence();
    _ReadWriteBarrier();
    return result;
}

// Invokes the _tpause() intrinsic with a deadline that lies WaitCycles time-stamp-counter
// ticks past the current fenced counter reading. MicroSleep() only takes this path when
// the CPU capabilities report waitpkg.
__forceinline static void TPAUSE() {
    // Wait budget, in TSC cycles. 100,000 cycles keeps the pause short while still
    // saving CPU resources. Rough wall-clock equivalents:
    //   1 GHz -> 100us
    //   2 GHz ->  50us
    //   4 GHz ->  25us
    static constexpr auto WaitCycles = 100'000;

    // Absolute counter value at which the pause should end.
    const auto deadline = FencedRDTSC() + WaitCycles;

    // The first argument is the control value; this code always passes 0.
    _tpause(0, deadline);
}
#else
// Executes `lfence; rdtsc; lfence` and returns the 64-bit counter value assembled from
// the two halves the instruction leaves in the A and D registers.
static u64 FencedRDTSC() {
    u64 low;  // bound to the A register ("=a"): low half of the counter
    u64 high; // bound to the D register ("=d"): high half of the counter
    asm volatile("lfence\n\t"
                 "rdtsc\n\t"
                 "lfence\n\t"
                 : "=a"(low), "=d"(high));
    // Stitch the halves together into one value: high half in bits 63:32.
    return low | (high << 32);
}

// Issues the TPAUSE instruction with a deadline that lies WaitCycles time-stamp-counter
// ticks past the current fenced counter reading. MicroSleep() only takes this path when
// the CPU capabilities report waitpkg.
static void TPAUSE() {
    // Value handed to the instruction's register operand; this code always uses 0.
    // NOTE(review): per Intel's TPAUSE description a clear bit 0 should select the
    // C0.2 state - confirm against the SDM.
    static constexpr auto Control = 0;

    // Wait budget, in TSC cycles. 100,000 cycles keeps the pause short while still
    // saving CPU resources. Rough wall-clock equivalents:
    //   1 GHz -> 100us
    //   2 GHz ->  50us
    //   4 GHz ->  25us
    static constexpr auto WaitCycles = 100'000;

    // Absolute counter value at which the pause should end, split into the two
    // 32-bit halves that are passed in the D (high) and A (low) registers.
    const auto deadline = FencedRDTSC() + WaitCycles;
    const auto deadline_hi = static_cast<u32>(deadline >> 32);
    const auto deadline_lo = static_cast<u32>(deadline & 0xFFFFFFFF);

    asm volatile("tpause %0" : : "r"(Control), "d"(deadline_hi), "a"(deadline_lo));
}
#endif

// Briefly relinquishes the CPU: uses TPAUSE() when the CPU capabilities report waitpkg,
// and falls back to std::this_thread::yield() otherwise.
void MicroSleep() {
    // Function-local static: the capability is read from GetCPUCaps() on first call only.
    static const bool tpause_supported = GetCPUCaps().waitpkg;

    if (!tpause_supported) {
        // No waitpkg: hand the remainder of the time slice back to the scheduler.
        std::this_thread::yield();
        return;
    }

    TPAUSE();
}

} // namespace Common::X64